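Things to keep track of:

  * Number of participants in each stage
  * Number of times that the outcome is collected
  * Number of texts:outcomes collected
  * Size of corpus:number of outcomes for each document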

Experiment 1

A quick, off-the-shelf experiment with a simple two-stage trial design.

# Switch the working directory to the project folder so that the relative
# path given to read_csv() below resolves.
# NOTE(review): this absolute path is machine-specific, and inside a notebook
# chunk the change is reset when the chunk finishes; the knitr root.dir option
# in the setup chunk is the suggested alternative.
setwd("/Users/Nikki/Dropbox/UNC/Causal NLP/")
The working directory was changed to /Users/Nikki/Dropbox/UNC/Causal NLP inside a notebook chunk. The working directory will be reset when the chunk is finished running. Use the knitr root.dir option in the setup chunk to change the working directory for notebook chunks.
# Read RebackDTM.csv into a data frame; the path is relative to the working
# directory. Presumably a document-term matrix, going by the file name --
# TODO confirm. Column types are left for read_csv() to guess.
rebackDTM <- read_csv("Reback_TxtLibrary/RebackDTM.csv")
Parsed with column specification:
cols(
  .default = col_double(),
  msgID = col_character()
)
See spec(...) for full column specifications.
# Pre-processing of rebackDTM, in three steps:
#   1. drop unwanted token columns,
#   2. add every variant column into its base-word column,
#   3. drop the variant columns that were just merged.
rebackDTM <- rebackDTM %>%
  # Step 1: remove underscore runs, number-like tokens, "aa", and a URL.
  select(
    -c(
      "________", "_________",
      "0880", "1", "10pm", "12", "1600", "1625", "1990",
      "201", "213", "2400", "262",
      "3", "30", "323", "3393",
      "4343", "463", "483", "4x",
      "5", "50", "5366", "5395", "5880",
      "6", "6100", "626", "653", "660", "6691",
      "7001", "758", "7669", "769",
      "800", "860", "877",
      "9.95", "933", "936", "993",
      "aa", "www.friendsgettingoff.org"
    )
  ) %>%
  # Step 2: each base-word column absorbs its variants. The entries are
  # independent of one another, so they are simply listed alphabetically.
  mutate(
    ass       = ass + asses,
    bareback  = bareback + barebacking,
    beat      = beat + beats,
    blow      = blow + blows,
    bootybump = bootybump + bootybumps,
    bottom    = bottom + bottomed + bottoming + bottoms,
    boundary  = boundary + boundaries,
    boy       = boy + boys,
    bring     = bring + brings,
    brush     = brush + brushed,
    bug       = bug + bugs,
    bump      = bump + bumps,
    chance    = chance + chances,
    choice    = choice + choices,
    clean     = clean + cleaner + cleaning,
    commit    = commit + commitment,
    condom    = condom + condoms + condomize,
    cruise    = cruise + cruising,
    day       = day + daily,
    disclose  = disclose + disclosure,
    dose      = dose + doses + dosing,
    easy      = easy + easier,
    feel      = feel + feeling,
    hepatitis = hep + hepatitis,
    live      = live + living,
    low       = low + lower + lowered + lowers,
    med       = med + meds,
    meth      = meth + methed,
    partner   = partner + partners,
    party     = party + partying,
    pharmacy  = pharmacy + pharmacist,
    positive  = positive + poz,
    protect   = protect + protecting + protection,
    safe      = safe + safer,
    sex       = sex + sexy,
    skip      = skip + skipping,
    speed     = speed + speeds,
    std       = std + stds,
    strong    = strong + stronger,
    treat     = treat + treatment
  ) %>%
  # Step 3: the variants now live in their base columns; remove them.
  # Listed in the same order as the merges above.
  select(
    -c(
      asses, barebacking, beats, blows, bootybumps,
      bottomed, bottoming, bottoms, boundaries, boys,
      brings, brushed, bugs, bumps,
      chances, choices, cleaner, cleaning, commitment,
      condoms, condomize, cruising,
      daily, disclosure, doses, dosing,
      easier, feeling, hep, living,
      lower, lowered, lowers,
      meds, methed,
      partners, partying, pharmacist, poz,
      protecting, protection,
      safer, sexy, skipping, speeds, stds, stronger,
      treatment
    )
  )
# Mean of the poliblog ratings for the training-set documents, after dividing
# the ratings by 100.
mean(poliblog.ratings[trainingSet]/100)
[1] -0.1398964
LS0tCnRpdGxlOiAiUiBOb3RlYm9vayIKb3V0cHV0OiBodG1sX25vdGVib29rCi0tLQoKVGhpbmdzIHRvIGtlZXAgdHJhY2sgb2Y6CgogICogTnVtYmVyIG9mIHBhcnRpY2lwYW50cyBpbiBlYWNoIHN0YWdlCiAgKiBOdW1iZXIgb2YgdGltZXMgdGhhdCB0aGUgb3V0Y29tZSBpcyBjb2xsZWN0ZWQKICAqIE51bWJlciBvZiB0ZXh0czpvdXRjb21lcyBjb2xsZWN0ZWQKICAqIFNpemUgb2YgY29ycHVzOm51bWJlciBvZiBvdXRjb21lcyBmb3IgZWFjaCBkb2N1bWVudAoKYGBge3IsIGVjaG8gPSBGQUxTRSwgcmVzdWx0cyA9ICdoaWRlJywgbWVzc2FnZSA9IEZBTFNFLCB3YXJuaW5nID0gRkFMU0UsIGluY2x1ZGUgPSBGQUxTRX0KbGlicmFyeShsZGEpCmxpYnJhcnkodGlkeXZlcnNlKQpgYGAKICAKIyMgRXhwZXJpbWVudCAxCgpRdWljayBvZmYgdGhlIHNoZWxmIGV4cGVyaW1lbnQgb2YgYSBzaW1wbGUgdHdvLXN0YWdlIHRyaWFsIGRlc2lnbi4gCgpgYGB7cn0Kc2V0d2QoIi9Vc2Vycy9OaWtraS9Ecm9wYm94L1VOQy9DYXVzYWwgTkxQLyIpCnJlYmFja0RUTSA8LSByZWFkX2NzdigiUmViYWNrX1R4dExpYnJhcnkvUmViYWNrRFRNLmNzdiIpCgojIEEgbGl0dGxlIHByZS1wcm9jZXNzaW5nCnJlYmFja0RUTSA8LSAKICByZWJhY2tEVE0gJT4lIHNlbGVjdCgtYygiX19fX19fX18iLCAiX19fX19fX19fIiwgIjA4ODAiLCAiMSIsICIxMHBtIiwgIjEyIiwgCiAgICAgICAgICAgICAgICAgICAgICAgICIxNjAwIiwgIjE2MjUiLCAiMTk5MCIsICIyMDEiLCAiMjEzIiwgIjI0MDAiLCAiMjYyIiwKICAgICAgICAgICAgICAgICAgICAgICAgIjMiLCAiMzAiLCAiMzIzIiwgIjMzOTMiLCAiNDM0MyIsICI0NjMiLCAiNDgzIiwgIjR4IiwKICAgICAgICAgICAgICAgICAgICAgICAgIjUiLCAiNTAiLCAiNTM2NiIsICI1Mzk1IiwgIjU4ODAiLCAiNiIsICI2MTAwIiwgIjYyNiIsCiAgICAgICAgICAgICAgICAgICAgICAgICI2NTMiLCAiNjYwIiwgIjY2OTEiLCAiNzAwMSIsICI3NTgiLCAiNzY2OSIsICI3NjkiLAogICAgICAgICAgICAgICAgICAgICAgICAiODAwIiwgIjg2MCIsICI4NzciLCAiOS45NSIsICI5MzMiLCAiOTM2IiwgIjk5MyIsIAogICAgICAgICAgICAgICAgICAgICAgICAiYWEiLCAid3d3LmZyaWVuZHNnZXR0aW5nb2ZmLm9yZyIpKSAlPiUKICBtdXRhdGUoYXNzID0gYXNzICsgYXNzZXMsIAogICAgICAgICBibG93ID0gYmxvdyArIGJsb3dzLCAKICAgICAgICAgYmFyZWJhY2sgPSBiYXJlYmFjayArIGJhcmViYWNraW5nLAogICAgICAgICBiZWF0ID0gYmVhdCArIGJlYXRzLAogICAgICAgICBib290eWJ1bXAgPSBib290eWJ1bXAgKyBib290eWJ1bXBzLAogICAgICAgICBib3R0b20gPSBib3R0b20gKyBib3R0b21lZCArIGJvdHRvbWluZyArIGJvdHRvbXMsCiAgICAgICAgIGJvdW5kYXJ5ID0gYm91bmRhcnkgKyBib3VuZGFyaWVzLAogICAgICAgICBib3kgPSBib3kgKyBib3lzLAogICAgICAgICBicnVzaCA9IGJydXNoICsgYnJ1c2hlZCwK
ICAgICAgICAgYnVtcCA9IGJ1bXAgKyBidW1wcywKICAgICAgICAgYnVnID0gYnVnICsgYnVncywKICAgICAgICAgYnJpbmcgPSBicmluZyArIGJyaW5ncywKICAgICAgICAgY2hhbmNlID0gY2hhbmNlICsgY2hhbmNlcywKICAgICAgICAgY2hvaWNlID0gY2hvaWNlICsgY2hvaWNlcywKICAgICAgICAgY2xlYW4gPSBjbGVhbiArIGNsZWFuZXIgKyBjbGVhbmluZywKICAgICAgICAgY29tbWl0ID0gY29tbWl0ICsgY29tbWl0bWVudCwKICAgICAgICAgY29uZG9tID0gY29uZG9tICsgY29uZG9tcyArIGNvbmRvbWl6ZSwKICAgICAgICAgY3J1aXNlID0gY3J1aXNlICsgY3J1aXNpbmcsIAogICAgICAgICBkYXkgPSBkYXkgKyBkYWlseSwKICAgICAgICAgZGlzY2xvc2UgPSBkaXNjbG9zZSArIGRpc2Nsb3N1cmUsCiAgICAgICAgIGRvc2UgPSBkb3NlICsgZG9zZXMgKyBkb3NpbmcsCiAgICAgICAgIGVhc3kgPSBlYXN5ICsgZWFzaWVyLAogICAgICAgICBmZWVsID0gZmVlbCArIGZlZWxpbmcsCiAgICAgICAgIGhlcGF0aXRpcyA9IGhlcCArIGhlcGF0aXRpcywKICAgICAgICAgbGl2ZSA9IGxpdmUgKyBsaXZpbmcsCiAgICAgICAgIGxvdyA9IGxvdyArIGxvd2VyICsgbG93ZXJlZCArIGxvd2VycywKICAgICAgICAgbWVkID0gbWVkICsgbWVkcywKICAgICAgICAgbWV0aCA9IG1ldGggKyBtZXRoZWQsCiAgICAgICAgIHBhcnR5ID0gcGFydHkgKyBwYXJ0eWluZywKICAgICAgICAgcGFydG5lciA9IHBhcnRuZXIgKyBwYXJ0bmVycywKICAgICAgICAgcGhhcm1hY3kgPSBwaGFybWFjeSArIHBoYXJtYWNpc3QsCiAgICAgICAgIHBvc2l0aXZlID0gcG9zaXRpdmUgKyBwb3osCiAgICAgICAgIHByb3RlY3QgPSBwcm90ZWN0ICsgcHJvdGVjdGluZyArIHByb3RlY3Rpb24sCiAgICAgICAgIHNhZmUgPSBzYWZlICsgc2FmZXIsCiAgICAgICAgIHNwZWVkID0gc3BlZWQgKyBzcGVlZHMsCiAgICAgICAgIHNleCA9IHNleCArIHNleHksCiAgICAgICAgIHNraXAgPSBza2lwICsgc2tpcHBpbmcsCiAgICAgICAgIHN0ZCA9IHN0ZCArIHN0ZHMsCiAgICAgICAgIHN0cm9uZyA9IHN0cm9uZyArIHN0cm9uZ2VyLAogICAgICAgICB0cmVhdCA9IHRyZWF0ICsgdHJlYXRtZW50KSAlPiUKICBzZWxlY3QoLWMoYXNzZXMsIGJsb3dzLCBiYXJlYmFja2luZywgYmVhdHMsIGJvb3R5YnVtcHMsCiAgICAgICAgICAgIGJydXNoZWQsIGJvdHRvbWVkLCBib3R0b21pbmcsIGJvdHRvbXMsIGJvdW5kYXJpZXMsIGJveXMsCiAgICAgICAgICAgYnVtcHMsIGJ1Z3MsIGNoYW5jZXMsIGJyaW5ncywgY2hvaWNlcywgY2xlYW5lciwKICAgICAgICAgICBjbGVhbmluZywgY29tbWl0bWVudCwgY29uZG9tcywgY29uZG9taXplLCBjcnVpc2luZywgCiAgICAgICAgICAgZGFpbHksIGRvc2VzLAogICAgICAgICAgIGRvc2luZywgZGlzY2xvc3VyZSwgZWFzaWVyLCBoZXAsIGxpdmluZywgbWV0aGVkLAogICAgICAgICAgIG1lZHMsIHBhcnR5aW5nLCBwYXJ0bmVycywgcGhhcm1hY2lzdCwgc2Fm
ZXIsIHNwZWVkcywgc2V4eSwKICAgICAgICAgICBsb3dlciwgbG93ZXJlZCwgbG93ZXJzLCBwb3osIGZlZWxpbmcsCiAgICAgICAgICAgcHJvdGVjdGluZywgcHJvdGVjdGlvbiwgc2tpcHBpbmcsIHN0cm9uZ2VyLAogICAgICAgICAgIHN0ZHMsIHRyZWF0bWVudCkpCgojIEdldCBhIHZlY3RvciBvZiB0aGUgdm9jYWJ1bGFyeQp2b2NhYiA8LSByZWJhY2tEVE0gJT4lIGZpbHRlcihzdHJfZGV0ZWN0KG1zZ0lELCAiXkF8XkIiKSkgJT4lCiAgc3VtbWFyaXNlX2F0KC52YXJzID0gdmFycyhhYmJleTp3b3J0aCksIHN1bSkgJT4lCiAgcGl2b3RfbG9uZ2VyKG5hbWVzX3RvID0gIndvcmQiLCB2YWx1ZXNfdG8gPSAiY291bnQiLCBjb2xzID0gYWJiZXk6d29ydGgpICU+JQogIGZpbHRlcihjb3VudCA+IDApICU+JQogIHNlbGVjdCh3b3JkKSAlPiUKICB1bmxpc3QoKQp2b2NhYiA8LSB1bm5hbWUodm9jYWIpCnZvY2FiREYgPC0gZGF0YS5mcmFtZSh3b3JkID0gdm9jYWIsIHdvcmROdW0gPSBzZXFfYWxvbmcodm9jYWIpKQoKIyBLZWVwIG9ubHkgdGhlIHZvY2FiIGluIHRoZSB0ZXh0IGJlaW5nIGFuYWx5emVkCiMgTGFzdCBiaXQgb2YgcHJlLXByb2Nlc3NpbmcKZHRtIDwtIHJlYmFja0RUTSAlPiUgZmlsdGVyKHN0cl9kZXRlY3QobXNnSUQsICJeQXxeQiIpKSAlPiUKICBzZWxlY3QobXNnSUQsIGFsbF9vZih2b2NhYikpICU+JQogIHNlbGVjdCgtYGRvZXNu4oCZdGApJT4lCiAgc2VsZWN0KC1gZG9u4oCZdGApCgoKCmRvY3VtZW50cyA8LSBkdG0gJT4lCiAgcGl2b3RfbG9uZ2VyKGNvbHMgPSBhZGQ6d29ydGgsIG5hbWVzX3RvID0gIndvcmQiLCB2YWx1ZXNfdG8gPSAiY291bnQiKSAlPiUKICBsZWZ0X2pvaW4odm9jYWJERiwgYnkgPSAid29yZCIpICU+JQogIG11dGF0ZSh3b3JkTnVtID0gd29yZE51bSAtIDEpICU+JQogIHNlbGVjdCgtd29yZCkgJT4lCiAgc2VsZWN0KG1zZ0lELCB3b3JkTnVtLCBjb3VudCkgJT4lCiAgZmlsdGVyKGNvdW50ID4gMCkgJT4lCiAgZ3JvdXBfYnkobXNnSUQpICU+JQogIG5lc3QoKSAlPiUKICBtdXRhdGUoZG9jdW1lbnRfbWF0cml4ID0gbWFwKGRhdGEsIGFzLm1hdHJpeCkpICU+JQogIG11dGF0ZShkb2N1bWVudF9tYXRyaXggPSBtYXAoZG9jdW1lbnRfbWF0cml4LCB0KSkgJT4lCiAgbXV0YXRlKGRvY3VtZW50X21hdHJpeCA9IG1hcChkb2N1bWVudF9tYXRyaXgsIHVubmFtZSkpCgpvdXRjb21lcyA8LSBkb2N1bWVudHMgJT4lIHNlbGVjdChtc2dJRCkgJT4lCiAgZGlzdGluY3QoKSAlPiUKICByb3d3aXNlKCkgJT4lCiAgbXV0YXRlKFkgPSBpZl9lbHNlKHN0cl9kZXRlY3QobXNnSUQsICJeQSIpLCBybm9ybSgxLCA1LCAyKSwgcm5vcm0oMSwgMCwgMikpKQoKCnNsZGEuZW0oZG9jdW1lbnRzID0gZG9jdW1lbnRzJGRvY3VtZW50X21hdHJpeCwgCiAgICAgICAgSyA9IDIsIAogICAgICAgIHZvY2FiID0gdm9jYWIsCiAgICAgICAgbnVtLmUuaXRlcmF0aW9ucyA9IDEwLCAKICAgICAgICBudW0ubS5pdGVyYXRpb25zID0g
NCwKICAgICAgICBhbHBoYSA9IDEuMCwgZXRhID0gMC4xLAogICAgICAgIGFubm90YXRpb25zID0gb3V0Y29tZXMkWSwgdmFyaWFuY2UgPSAxLCAKICAgICAgICBsb2dpc3RpYyA9IEZBTFNFLAogICAgICAgIHBhcmFtcyA9IGMoMSwgMSkpCmBgYAoKYGBge3J9CiMjIFVzZSB0aGUgcG9saXRpY2FsIGJsb2dzIGRhdGEgc2V0LgpkYXRhKHBvbGlibG9nLmRvY3VtZW50cykKCmRhdGEocG9saWJsb2cudm9jYWIpCgpkYXRhKHBvbGlibG9nLnJhdGluZ3MpCgpudW0udG9waWNzIDwtIDEwCgojIyBEaXZpZGUgaW4gaGFsZgp0cmFpbmluZ1NldCA8LSBzYW1wbGUoeCA9IDE6bGVuZ3RoKHBvbGlibG9nLmRvY3VtZW50cyksIHNpemUgPSBsZW5ndGgocG9saWJsb2cuZG9jdW1lbnRzKS8yLS41KQp0ZXN0U2V0IDwtIDE6bGVuZ3RoKHBvbGlibG9nLmRvY3VtZW50cykKdGVzdFNldCA8LSB0ZXN0U2V0WyEoMTpsZW5ndGgocG9saWJsb2cuZG9jdW1lbnRzKSAlaW4lIHRyYWluaW5nU2V0KV0KCiMjIEluaXRpYWxpemUgdGhlIHBhcmFtcwpwYXJhbXMgPC0gc2FtcGxlKGMoLTEsIDEpLCBudW0udG9waWNzLCByZXBsYWNlPVRSVUUpCgpyZXN1bHQgPC0gc2xkYS5lbShkb2N1bWVudHM9cG9saWJsb2cuZG9jdW1lbnRzW3RyYWluaW5nU2V0XSwKICAgICAgICAgICAgICAgICAgIEs9bnVtLnRvcGljcywKICAgICAgICAgICAgICAgICAgIHZvY2FiPXBvbGlibG9nLnZvY2FiLAogICAgICAgICAgICAgICAgICAgbnVtLmUuaXRlcmF0aW9ucz0xMCwKICAgICAgICAgICAgICAgICAgIG51bS5tLml0ZXJhdGlvbnM9NCwKICAgICAgICAgICAgICAgICAgIGFscGhhPTEuMCwgZXRhPTAuMSwKICAgICAgICAgICAgICAgICAgIHBvbGlibG9nLnJhdGluZ3NbdHJhaW5pbmdTZXRdIC8gMTAwLAogICAgICAgICAgICAgICAgICAgcGFyYW1zLAogICAgICAgICAgICAgICAgICAgdmFyaWFuY2U9MC4yNSwKICAgICAgICAgICAgICAgICAgIGxhbWJkYT0xLjAsCiAgICAgICAgICAgICAgICAgICBsb2dpc3RpYz1GQUxTRSwKICAgICAgICAgICAgICAgICAgIG1ldGhvZD0ic0xEQSIpCgoKCiMjIE1ha2UgYSBwcmV0dHkgcGljdHVyZS4KcmVxdWlyZSgiZ2dwbG90MiIpCgpUb3BpY3MgPC0gYXBwbHkodG9wLnRvcGljLndvcmRzKHJlc3VsdCR0b3BpY3MsIDUsIGJ5LnNjb3JlPVRSVUUpLAogICAgICAgICAgICAgICAgMiwgcGFzdGUsIGNvbGxhcHNlPSIgIikKCmNvZWZzIDwtIGRhdGEuZnJhbWUoY29lZihzdW1tYXJ5KHJlc3VsdCRtb2RlbCkpKQoKdGhlbWVfc2V0KHRoZW1lX2J3KCkpCgpjb2VmcyA8LSBjYmluZChjb2VmcywgVG9waWNzPWZhY3RvcihUb3BpY3MsIFRvcGljc1tvcmRlcihjb2VmcyRFc3RpbWF0ZSldKSkKCmNvZWZzIDwtIGNvZWZzW29yZGVyKGNvZWZzJEVzdGltYXRlKSxdCgpxcGxvdChUb3BpY3MsIEVzdGltYXRlLCBjb2xvdXI9RXN0aW1hdGUsIHNpemU9YWJzKHQudmFsdWUpLCBkYXRhPWNvZWZzKSArCiAgZ2VvbV9lcnJvcmJhcih3aWR0aD0wLjUsIGFlcyh5
bWluPUVzdGltYXRlLVN0ZC4uRXJyb3IsCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICB5bWF4PUVzdGltYXRlK1N0ZC4uRXJyb3IpKSArIGNvb3JkX2ZsaXAoKQoKcHJlZGljdGlvbnMgPC0gc2xkYS5wcmVkaWN0KHBvbGlibG9nLmRvY3VtZW50cywKICAgICAgICAgICAgICAgICAgICAgICAgICAgICByZXN1bHQkdG9waWNzLAogICAgICAgICAgICAgICAgICAgICAgICAgICAgIHJlc3VsdCRtb2RlbCwKICAgICAgICAgICAgICAgICAgICAgICAgICAgICBhbHBoYSA9IDEuMCwKICAgICAgICAgICAgICAgICAgICAgICAgICAgICBldGE9MC4xKQoKcXBsb3QocHJlZGljdGlvbnMsCiAgICAgICBmaWxsPWZhY3Rvcihwb2xpYmxvZy5yYXRpbmdzKSwKICAgICAgIHhsYWIgPSAicHJlZGljdGVkIHJhdGluZyIsCiAgICAgICB5bGFiID0gImRlbnNpdHkiLAogICAgICAgYWxwaGE9SSgwLjUpLAogICAgICAgZ2VvbT0iZGVuc2l0eSIpICsKICAgZ2VvbV92bGluZShhZXMoeGludGVyY2VwdD0wKSkgKwogICB0aGVtZShsZWdlbmQucG9zaXRpb24gPSAibm9uZSIpCgojID4gcHJlZGljdGVkLmRvY3N1bXMgPC0gc2xkYS5wcmVkaWN0LmRvY3N1bXMocG9saWJsb2cuZG9jdW1lbnRzLAojICsgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgcmVzdWx0JHRvcGljcywgCiMgKyAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICBhbHBoYSA9IDEuMCwKIyArICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgIGV0YT0wLjEpCiMgCiMgPiBwcmVkaWN0ZWQucHJvcG9ydGlvbnMgPC0gdChwcmVkaWN0ZWQuZG9jc3VtcykgLyBjb2xTdW1zKHByZWRpY3RlZC5kb2NzdW1zKQojIApxcGxvdChgVG9waWMgMWAsIGBUb3BpYyAyYCwKICAgICAgZGF0YSA9IHN0cnVjdHVyZShkYXRhLmZyYW1lKHByZWRpY3RlZC5wcm9wb3J0aW9ucyksCiAgICAgICAgICAgICAgICAgICAgICAgbmFtZXMgPSBwYXN0ZSgiVG9waWMiLCAxOjEwKSksCiAgICAgIHNpemUgPSBgVG9waWMgM2ApCgpwcmVkaWN0ZWRWYWx1ZXMgPC0gdW5saXN0KG1hcChyZXN1bHQkYXNzaWdubWVudHMsIGZ1bmN0aW9uKGFzc2lnbm1lbnQpe3JldHVybihzdW0oYXNzaWdubWVudCA9PSAyKS9sZW5ndGgoYXNzaWdubWVudCkpfSkpIAp0b3BEb2NzIDwtIHdoaWNoKHByZWRpY3RlZFZhbHVlcyA+IDAuMjUpCm1lYW4ocG9saWJsb2cucmF0aW5nc1t0cmFpbmluZ1NldFt0b3BEb2NzXV0vMTAwKQptZWFuKHBvbGlibG9nLnJhdGluZ3NbdHJhaW5pbmdTZXRdLzEwMCkKYGBgCgpgYGB7cn0KcmViYWNrRFRNCmBgYAo=